library(haven)

# Load in Data set
# Read the 2020 Race IAT public file (SPSS format) from the local Data folder.
impdat20_bw <- read_spss(file = "./Data/Race.IAT.public.2020.sav")
# Subset to USA: keep rows whose country-of-residence code equals 1.
# which() drops rows where the code is missing, exactly as subset() does.
impdat20_bw <- impdat20_bw[which(impdat20_bw$countryres_num == 1), ]

# Meta Info ---------------------------------------------------------------
# Session date as a Date. Despite the "_mdy" suffix, the value is built from
# the year-month-day ("%Y-%m-%d") text form of `date`.
impdat20_bw$date_mdy <- as.Date(format(impdat20_bw$date, "%Y-%m-%d"))
# Week of the year as a two-character string ("%W" format code).
impdat20_bw$week <- format(as.Date(impdat20_bw$date), "%W")
# Same week label, with week "00" folded into week "01".
impdat20_bw$week_52 <- replace(
  impdat20_bw$week,
  which(impdat20_bw$week == "00"),
  "01"
)

# Demographics ---------------------------------------------------------------
# Age
# Age in years: session year minus birth year, computed only for rows whose
# birth year is after 1900. Rows with a missing or implausible birth year keep
# whatever value `age` already had (NA when the column did not exist before).
impdat20_bw$age <- local({
  # Start from a full-length vector so the indexed assignment below can never
  # produce a vector shorter than the data (which would make the column
  # assignment fail when the last rows have no valid birth year).
  age <- if ("age" %in% names(impdat20_bw)) {
    impdat20_bw$age
  } else {
    rep(NA, nrow(impdat20_bw))
  }
  valid_birthyear <- which(impdat20_bw$birthyear > 1900)
  age[valid_birthyear] <- impdat20_bw$year[valid_birthyear] -
    impdat20_bw$birthyear[valid_birthyear]
  age
})

# Age rescaled to the unit interval using the observed minimum and maximum.
impdat20_bw$age_sc <- local({
  age_range <- range(impdat20_bw$age, na.rm = TRUE)
  (impdat20_bw$age - age_range[1]) / (age_range[2] - age_range[1])
})

# Four age bands. Ages below 18 and missing ages stay NA.
impdat20_bw$age_cat4 <- local({
  age <- impdat20_bw$age
  band <- rep(NA, nrow(impdat20_bw))
  band[which(age >= 18 & age <= 29)] <- "18-29"
  band[which(age >= 30 & age <= 44)] <- "30-44"
  band[which(age >= 45 & age <= 64)] <- "45-64"
  band[which(age >= 65)] <- "65+"
  as.factor(band)
})

# Sex
# Recode birthSex into a character flag: code 1 -> "m", code 2 -> "f".
# Any other code, and missing values, remain NA.
impdat20_bw$sex <- local({
  birth_sex <- impdat20_bw$birthSex
  sex_flag <- rep(NA, nrow(impdat20_bw))
  sex_flag[which(birth_sex == 1)] <- "m"
  sex_flag[which(birth_sex == 2)] <- "f"
  sex_flag
})

# Race and Ethnicity
# Labelled race factor built from the numeric raceomb002 codes.
# The levels are fixed to the codes 1..8 that the eight labels describe,
# instead of being derived from the largest code observed in the data: the
# label vector always has eight entries, so a data-driven level count would
# make factor() fail whenever the observed maximum is not exactly 8.
# Codes outside 1..8 and missing codes become NA.
impdat20_bw$race <- local({
  race_labels <- c(
    "American Indian/Alaskan Native",
    "East Asian",
    "South Asian",
    "Native Hawaiian/Pacific Islander",
    "Black",
    "White",
    "Other",
    "Multiracial"
  )
  factor(
    impdat20_bw$raceomb002,
    levels = seq_along(race_labels),
    labels = race_labels
  )
})

# Hispanic indicator from ethnicityomb: code 1 -> 1, code 2 -> 0.
# Every other code (the "unknowns") and missing values are left as NA.
impdat20_bw$hisp <- local({
  ethnicity <- impdat20_bw$ethnicityomb
  hisp_flag <- rep(NA, nrow(impdat20_bw))
  hisp_flag[which(ethnicity == 2)] <- 0
  hisp_flag[which(ethnicity == 1)] <- 1
  hisp_flag
})

# Five-category race/ethnicity. Anyone flagged Hispanic is "Hispanic"
# regardless of race; the remaining categories require hisp == 0, so rows with
# unknown ethnicity stay NA.
# NOTE(review): non-Hispanic "American Indian/Alaskan Native" respondents match
# none of the rules below and therefore end up NA - confirm this is intended.
impdat20_bw$race5 <- local({
  race <- impdat20_bw$race
  non_hisp <- impdat20_bw$hisp == 0
  grp <- rep(NA, nrow(impdat20_bw))
  grp[which(race %in% c("East Asian", "South Asian",
                        "Native Hawaiian/Pacific Islander") & non_hisp)] <-
    "Asian/Pacific Islander"
  grp[which(race == "Black" & non_hisp)] <- "Black"
  grp[which(race == "White" & non_hisp)] <- "White"
  grp[which(race %in% c("Other", "Multiracial") & non_hisp)] <- "Other"
  grp[which(impdat20_bw$hisp == 1)] <- "Hispanic"
  # Level order is spelled out by name ("Other" last). Reordering the
  # alphabetical levels by position breaks as soon as one category is absent
  # from the data.
  factor(grp, levels = c("Asian/Pacific Islander", "Black", "Hispanic",
                         "White", "Other"))
})

# Three-category collapse of race5: "White", "Black", and "Other" for every
# remaining non-missing category. Rows with a missing race5 stay NA.
impdat20_bw$race3 <- local({
  is_black <- impdat20_bw$race5 == "Black"
  is_white <- impdat20_bw$race5 == "White"
  grp <- rep(NA, nrow(impdat20_bw))
  grp[which(!is_black & !is_white)] <- "Other"
  grp[which(is_black)] <- "Black"
  grp[which(is_white)] <- "White"
  grp
})

# Ideology
# Three-point ideology from politicalid_7, split at the midpoint value 4:
# below 4 -> 1 (labelled "conservative"), exactly 4 -> 0 ("moderate"),
# above 4 -> -1 ("liberal"). Missing responses stay NA.
impdat20_bw$ideo3 <- local({
  pol_id <- impdat20_bw$politicalid_7
  ideo <- rep(NA, nrow(impdat20_bw))
  ideo[which(pol_id < 4)] <- 1
  ideo[which(pol_id == 4)] <- 0
  ideo[which(pol_id > 4)] <- -1
  ideo
})
# The code-to-label mapping is stated explicitly. Relying on the default
# sorted levels gives the same mapping only while all three codes occur in the
# data, and fails on the label count otherwise.
impdat20_bw$ideo3_lab <- factor(impdat20_bw$ideo3,
                                levels = c(-1, 0, 1),
                                labels = c("liberal", "moderate", "conservative"))

# 0/1 indicator for each ideology group (NA where ideo3 is NA).
impdat20_bw$ideo_lib <- ifelse(impdat20_bw$ideo3 == -1, 1, 0)
impdat20_bw$ideo_mod <- ifelse(impdat20_bw$ideo3 == 0, 1, 0)
impdat20_bw$ideo_con <- ifelse(impdat20_bw$ideo3 == 1, 1, 0)

# Reversed seven-point scale (7 minus the response), so larger values sit on
# the side that ideo3 codes as conservative, then divided by 6.
# NOTE(review): presumably politicalid_7 runs 1..7, giving ideo7 in 0..6 and
# ideo7_sc in 0..1 - confirm against the codebook.
impdat20_bw$ideo7 <- impdat20_bw$politicalid_7 * -1 + 7
impdat20_bw$ideo7_sc <- impdat20_bw$ideo7 / 6

# Region
# South indicator: 1 for the eleven states listed below, 0 for any other
# reported state, NA when no state was reported. A state counts as unreported
# when it is the empty string or NA, so this column agrees with census_region,
# which is also NA for those rows.
impdat20_bw$south <- local({
  state <- impdat20_bw$STATE
  south_states <- c("VA", "NC", "SC", "GA", "FL", "MS", "AL", "TN", "AR",
                    "LA", "TX")
  flag <- ifelse(state %in% south_states, 1, 0)
  flag[which(is.na(state) | state == "")] <- NA
  flag
})

# Four-level region factor from the state abbreviation. States that appear in
# none of the lists below (including blank or missing states) are NA.
impdat20_bw$census_region <- local({
  state <- impdat20_bw$STATE
  states_by_region <- list(
    South = c("DE", "MD", "DC", "WV", "KY", "OK",
              "VA", "NC", "SC", "GA", "FL", "MS", "AL",
              "TN", "AR", "LA", "TX"),
    West = c("CA", "OR", "WA", "MT", "WY",
             "ID", "CO", "UT", "AZ", "NM",
             "NV", "AK", "HI"),
    Midwest = c("ND", "SD", "MN", "WI",
                "IA", "NE", "KS", "MO",
                "IL", "IN", "MI", "OH"),
    Northeast = c("ME", "VT", "NH", "MA", "RI",
                  "CT", "NY", "NJ", "PA")
  )
  region <- rep(NA, nrow(impdat20_bw))
  for (region_name in names(states_by_region)) {
    region[which(state %in% states_by_region[[region_name]])] <- region_name
  }
  as.factor(region)
})

# Education
# Five-level education code derived from the raw `edu` item.
impdat20_bw$edu_cat <- local({
  edu <- impdat20_bw$edu
  level <- rep(NA, nrow(impdat20_bw))
  level[which(edu >= 8)] <- 5               # Adv degree or schooling
  level[which(edu == 7)] <- 4               # College
  level[which(edu == 5 | edu == 6)] <- 3    # Some college or associates
  level[which(edu == 4)] <- 2               # HS
  level[which(edu <= 3)] <- 1               # Less than HS
  level
})
# College-degree indicator: 1 for levels 4 and 5, 0 below, NA when unknown.
impdat20_bw$col <- ifelse(impdat20_bw$edu_cat >= 4, 1, 0)

# Four-level labelled version: levels 1 and 2 share the "HS or Less" label.
impdat20_bw$edu_cat4 <- local({
  label_by_level <- c("HS or Less", "HS or Less", "Some College", "College",
                      "Post-Grad")
  # An NA level indexes to NA, so unknown education stays missing.
  factor(label_by_level[as.integer(impdat20_bw$edu_cat)],
         levels = unique(label_by_level))
})

# Reason for Visiting
# impdat20_bw$broughtwebsite
# Collapse the `broughtwebsite` answers into five broader groups through a
# parallel lookup: entry i of `answer` maps to entry i of `grouped`.
# Answers not listed here, and missing answers, become NA.
impdat20_bw$broughtwebsite2 <- local({
  answer <- c("Assignment for school",
              "Assignment for work",
              "Mention in a news story (any medium)",
              "My Internet search for this topic or a related topic",
              "Mention or link at a non-news Internet site",
              "Recommendation of a friend or co-worker",
              "Other",
              "null")
  grouped <- c("Assignment school/work",
               "Assignment school/work",
               "News Mention",
               "Internet Mention/Search",
               "Internet Mention/Search",
               "Peer Recommendation",
               "Other/null",
               "Other/null")
  as.factor(grouped[match(impdat20_bw$broughtwebsite, answer)])
})

# Interview Date Indicators -----------------------------------------------
# 1 for sessions dated after 2020-05-25, 0 otherwise.
# NOTE(review): "gf" presumably refers to the George Floyd killing on that
# date - confirm.
impdat20_bw$post_gf <- ifelse(as.Date("2020-05-25") < impdat20_bw$date_mdy, 1, 0)

# Three consecutive follow-up windows, each open on the left and closed on the
# right: (05-25, 06-26], (06-26, 07-26], (07-26, 08-26].
impdat20_bw$post_gf_1month <- local({
  session_date <- impdat20_bw$date_mdy
  ifelse(as.Date("2020-05-25") < session_date &
           session_date <= as.Date("2020-06-26"),
         1, 0)
})
impdat20_bw$post_gf_2month <- local({
  session_date <- impdat20_bw$date_mdy
  ifelse(as.Date("2020-06-26") < session_date &
           session_date <= as.Date("2020-07-26"),
         1, 0)
})
impdat20_bw$post_gf_3month <- local({
  session_date <- impdat20_bw$date_mdy
  ifelse(as.Date("2020-07-26") < session_date &
           session_date <= as.Date("2020-08-26"),
         1, 0)
})


# Attitudes ---------------------------------------------------------------
# Thermometers
# Feeling thermometers divided by 10 (the column names indicate a 0-10 scale,
# which would put the result on 0-1).
impdat20_bw[["tblack_sc"]] <- impdat20_bw[["Tblack_0to10"]] / 10
impdat20_bw[["twhite_sc"]] <- impdat20_bw[["Twhite_0to10"]] / 10

# White-minus-Black thermometer difference; positive values mean the White
# thermometer was rated higher.
impdat20_bw[["t_wb"]] <- with(impdat20_bw, twhite_sc - tblack_sc)

# D Score
# Per email communication
# Bin the IAT D score (D_biep.White_Good_all) into eight ordered preference
# categories, from "Strong Black" (most negative D) to "Strong White" (most
# positive D). Cut points are +/-.15, +/-.35 and +/-.65; a score of exactly 0
# falls in "Little or No White". Missing scores stay NA.
impdat20_bw$IAT_D <- local({
  d <- impdat20_bw$D_biep.White_Good_all
  bin <- rep(NA, nrow(impdat20_bw))
  bin[which(d < -.65)] <- "Strong Black"
  bin[which(d >= -.65 & d <= -.35)] <- "Moderate Black"
  bin[which(d > -.35 & d <= -.15)] <- "Slight Black"
  bin[which(d > -.15 & d < 0)] <- "Little or No Black"
  bin[which(d >= 0 & d < .15)] <- "Little or No White"
  bin[which(d >= .15 & d < .35)] <- "Slight White"
  bin[which(d >= .35 & d <= .65)] <- "Moderate White"
  bin[which(d > .65)] <- "Strong White"
  # The level names must match the assigned strings exactly. Listing
  # "Medium ..." here would turn every "Moderate ..." case into NA.
  factor(bin,
         levels = c("Strong Black", "Moderate Black", "Slight Black",
                    "Little or No Black", "Little or No White",
                    "Slight White", "Moderate White", "Strong White"))
})


